"""
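Problem:
[nltk_data] Error loading averaged_perceptron_tagger_eng: <urlopen
[nltk_data]     error [SSL: CERTIFICATE_VERIFY_FAILED] certificate
Fix: download averaged_perceptron_tagger_eng.zip offline first, then add the code below at the top of this file; manually unzipping the archive into the directory does not work.
Directory: /Users/brightzhou/nltk_data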
"""
# import nltk
# import ssl
#
# try:
#     _create_unverified_https_context = ssl._create_unverified_context
# except AttributeError:
#     pass
# else:
#     ssl._create_default_https_context = _create_unverified_https_context
#
# nltk.download('averaged_perceptron_tagger')
""""end"""
"""
Load an HTML file.
"""
from langchain_community.document_loaders import UnstructuredHTMLLoader

# Relative path of the sample HTML document to load.
file_path = "../resource/test.html"

# Build the loader for that document, forwarding the encoding as a keyword
# argument, then load it and print the result.
loader = UnstructuredHTMLLoader(file_path, encoding="UTF-8")
data = loader.load()
print(data)
